from feature_data.XmlData2DictData import Xml2Dict
from feature_data.const_data import *
from nd_utils.Graph_Cluster_util import get_org_str

# XML input files to scan. Only the first file is currently enabled.
# The remaining candidates were previously parked in a bare string literal
# (a no-op expression statement); they are kept here as a real comment.
# Append any of them to the list to widen the scan (presumably all are
# provided by the wildcard import from feature_data.const_data -- confirm):
#   xml_file_name2, xml_file_name3, xml_file_name4, xml_file_name5,
#   xml_file_name6, xml_file_name7, xml_file_name8, xml_file_name9
xml_file_name_list = [
    xml_file_name1,
]
# Gather the distinct 'organization' value of every publication found in
# the configured XML files.
paper_org_set = set()
for xml_file_name in xml_file_name_list:
    # The path is built by plain string concatenation, so xml_dir must
    # already end with whatever separator the file names expect.
    xml2dict = Xml2Dict(xml_dir + xml_file_name)
    publication_dict = xml2dict.publication_dict

    # Only the per-publication attribute dicts are needed; the paper ids
    # (the mapping's keys) are irrelevant here, so iterate the values.
    paper_org_set.update(
        publication_attr_dict['organization']
        for publication_attr_dict in publication_dict.values()
    )

# sorted() accepts any iterable and always returns a new list, so no
# intermediate list() copy is required.
# NOTE: the name is kept for compatibility, but from here on it refers to
# a sorted list rather than a set.
paper_org_set = sorted(paper_org_set)

# Print every organization value followed by the result of get_org_str()
# for it, with a separator line after each pair.
for org in paper_org_set:
    # Single-argument print(...) is valid under both Python 2 (print
    # statement with a parenthesised expression) and Python 3 (function
    # call), and produces the same output in either.
    print(org)
    print(get_org_str(org))
    print("======")